Cream of the Crop 3

home *** CD-ROM | disk | FTP | other *** search

/ Cream of the Crop 3 / Cream of the Crop 3.iso / comm / wnos5src.zip / LZW.C < prev next >

Wrap

Text File | 1993-10-19 | 15KB | 607 lines

/* SM0RGV data compression routines. * This file implements the Lempel-Ziv Welch (LZW) data compression * algorithm but with a variable code size, as in GIF format files. * * Copyright 1990 by Anders Klemets, SM0RGV. * Permission granted for non-commercial distribution only. */ #include "global.h" #include "config.h" #ifdef LZW #include "mbuf.h" #include "proc.h" #include "lzw.h" #include "usock.h" #include "session.h" #include "cmdparse.h" #include <ctype.h> static void near fastencode __ARGS((struct usock *up,char data)); static void near morebits __ARGS((struct lzw *lzw)); static void near cleartbl __ARGS((struct lzw *lzw)); static void near addtobuffer __ARGS((struct usock *up,int32 code)); static void near decodetbl __ARGS((int32 code,struct lzw *lzw)); static int32 near nextcode __ARGS((struct usock *up)); int dolzw(int argc,char **argv,void *p) { switch(*argv[1]) { case 'm': if(argc == 2) { tprintf("LZW mode: %s\n",Lzwmode ? "fast" : "compact"); return 0; } else { switch(*argv[2]) { case 'f': Lzwmode = LZWFAST; return 0; case 'c': Lzwmode = LZWCOMPACT; return 0; default: tputs("Usage: lzw mode <fast|compact>\n"); return -1; } } case 'b': return setintrc(&Lzwbits,"LZW bits",--argc,++argv,9,16); case '+': if(argc == 3) { struct session *sp; if((sp = sessptr(argv[2])) != NULLSESSION) { lzwinit(sp->s,Lzwbits,Lzwmode); } } return 0; } return -1; } /* Initialize a socket for compression. Bits specifies the maximum number * of bits per codeword. The input and output code tables might grow to * about (2^bits * 3) bytes each. The bits parameter does only serve as a * recommendation for the decoding, the actual number of bits may be * larger, but not never more than 16. */ void lzwinit( int s, /* socket to operate on */ int bits, /* maximum number of bits per codeword */ int mode) /* compression mode, LZWCOMPACT or LZWFAST */ { struct usock *up; if((up = itop(s)) == NULLUSOCK) { return; } up->zout = mxallocw(sizeof(struct lzw)); up->zin = mxallocw(sizeof(struct lzw)); up->zout->codebits = LZWBITS; if(bits < LZWBITS) { up->zout->maxbits = LZWBITS; } if(bits > 16 || bits == 0) { up->zout->maxbits = 16; } if(bits >= LZWBITS && bits <= 16) { up->zout->maxbits = bits; } up->zout->nextbit = 0; up->zout->prefix = -1; up->zout->version = -1; up->zout->code = -1; up->zout->mode = (mode & 1); /* only the last bit is significant */ up->zout->next = ZFLUSH + 1; /* used only in LZWFAST mode */ up->zin->codebits = LZWBITS; up->zin->maxbits = -1; up->zin->nextbit = 0; up->zin->prefix = -1; up->zin->version = -1; up->zin->code = -1; up->zin->mode = LZWCOMPACT; up->zin->next = ZFLUSH + 1; up->zin->buf = NULLBUF; } void lzwfree(struct usock *up) { if(up->zout != NULLLZW) { cleartbl(up->zout); xfree(up->zout); up->zout = NULLLZW; } if(up->zin != NULLLZW) { cleartbl(up->zin); free_q(&up->zin->buf); xfree(up->zin); up->zin = NULLLZW; } } /* LZW encoding routine. * See if the string specified by code + data is in the string table. If so, * set prefix equal to the code of that string. Otherwise insert code + data * in the string and set prefix equal to data. */ void lzwencode(int s,char data) { struct usock *up; struct lzw *lzw; int32 code, pagelim; unsigned int i,j; if((up = itop(s)) == NULLUSOCK) { return; } lzw = up->zout; code = up->zout->prefix; /* the first byte sent will be the version number */ if(lzw->version == -1) { lzw->version = ZVERSION; up->obuf->data[up->obuf->cnt++] = lzw->version; /* then send our recommended maximum number of codebits */ up->obuf->data[up->obuf->cnt++] = lzw->maxbits; } lzw->cnt++; if(code == -1) { lzw->prefix = (int32)uchar(data); return; } if(lzw->mode == LZWFAST) { fastencode(up,data); return; } pagelim = ((int32) 1 << lzw->codebits) / LZWBLK + 1; if(code <= ZFLUSH) { i = j = 0; } else { i = (unsigned int)((code - ZFLUSH) / LZWBLK); j = (unsigned int)((code - ZFLUSH) % LZWBLK); } if(lzw->tu.tbl == NULL) { lzw->tu.tbl = cxallocw((unsigned)pagelim,sizeof(struct zentry *)); } for(;;) { if(itop(s) == NULLUSOCK) { /* the connection has been closed */ return; } if(up->zout == NULLLZW) { /* ...or is about to be closed */ return; } if(lzw->tu.tbl[i] == (struct zentry *)0) { lzw->tu.tbl[i] = cxallocw(LZWBLK,sizeof(struct zentry)); memset(lzw->tu.tbl[i],0xff,LZWBLK * sizeof(struct zentry)); } while(j < LZWBLK) { if(lzw->tu.tbl[i][j].data == data && lzw->tu.tbl[i][j].code == (int16)code) { lzw->prefix = (int32)(i * LZWBLK + j + ZFLUSH + 1); return; } if(lzw->tu.tbl[i][j].code == 0xffff) { lzw->tu.tbl[i][j].code = (int16)code; lzw->tu.tbl[i][j].data = data; addtobuffer(up,code); lzw->prefix = (int32) uchar(data); lzw->next++; if(lzw->next == (int32) (1 << lzw->codebits)) { /* the current table is now full */ morebits(lzw); } if(lzw->next + 1 == (int32) (1 << lzw->maxbits)) { /* The last codeword has been reached. * (Or last - 1.) Signal this and start all * over again. */ addtobuffer(up,lzw->prefix); if(lzw->next + 1 == (int32) (1 << lzw->codebits)) { morebits(lzw); } addtobuffer(up,ZCC); cleartbl(lzw); } return; } ++j; } pwait(NULL); ++i; j = 0; } } /* Used when LZWFAST mode is selected. Memory usage approx. (2^bits * 5) * bytes. */ static void near fastencode(struct usock *up,char data) { struct zfast *z; struct mbuf *bp; int16 cnt, h; struct lzw *lzw = up->zout; int32 code = up->zout->prefix; if(lzw->tu.bpp == NULLBUFP) { lzw->tu.bpp = cxallocw(ZHASH,sizeof(struct mbuf *)); } h = lobyte(code); h ^= hibyte(code); h ^= data; h = h % ZHASH; if(lzw->tu.bpp[h] == NULLBUF) { lzw->tu.bpp[h] = alloc_mbuf(LZWBLK); } bp = lzw->tu.bpp[h]; cnt = bp->cnt / sizeof(struct zfast); z = (struct zfast *) bp->data; while(cnt > 0) { if(z->data == data && z->code == (int16)code) { lzw->prefix = (int32) z->owncode; return; } z++; if(--cnt == 0) { if(bp->next == NULLBUF) { break; } bp = bp->next; cnt = bp->cnt / sizeof(struct zfast); z = (struct zfast *) bp->data; } } if(bp->size - bp->cnt >= sizeof(struct zfast)) { z = (struct zfast *) &bp->data[bp->cnt]; bp->cnt += sizeof(struct zfast); } else { bp->next = alloc_mbuf(LZWBLK); z = (struct zfast *) bp->next->data; bp->next->cnt = sizeof(struct zfast); } z->code = (int16)code; z->data = data; z->owncode = (int16)lzw->next++; addtobuffer(up,code); lzw->prefix = (int32) uchar(data); if(lzw->next == (int32) (1 << lzw->codebits)) { /* Increase the number of bits per codeword */ morebits(lzw); } if(lzw->next + 1 == (int32) (1 << lzw->maxbits)) { /* The last codeword has been reached. (Or last - 1.) * Signal this and start all over again. */ addtobuffer(up,lzw->prefix); if(lzw->next + 1 == (int32) (1 << lzw->codebits)) { morebits(lzw); } addtobuffer(up,ZCC); cleartbl(lzw); } pwait(NULL); } /* increase the number of significant bits in the codewords, and increase * the size of the string table accordingly. */ static void near morebits(struct lzw *lzw) { lzw->codebits++; if(lzw->mode != LZWFAST) { int32 oldp = ((int32) 1 << lzw->codebits) / LZWBLK + 1; int32 pagelim = ((int32) 1 << lzw->codebits) / LZWBLK + 1; struct zentry **newt = cxallocw((int)pagelim,sizeof(struct zentry *)); memcpy(newt,lzw->tu.tbl,sizeof(struct zentry *) * (int)oldp); xfree(lzw->tu.tbl); lzw->tu.tbl = newt; } } static void near cleartbl(struct lzw *lzw) { int32 i; lzw->codebits = LZWBITS; lzw->prefix = -1; lzw->next = ZFLUSH + 1; if(lzw->tu.p == NULL) { return; } if(lzw->mode == LZWCOMPACT) { int32 pagelim = ((int32) 1 << lzw->codebits) / LZWBLK + 1; for(i = 0; i < pagelim; ++i) { xfree(lzw->tu.tbl[(int)i]); } } else { for(i = 0; i < ZHASH; ++i) { free_p(lzw->tu.bpp[(int)i]); } } xfree(lzw->tu.p); lzw->tu.p = NULL; } /* Add a codeword to the code stream. Nextbit indicates at which bit in the * code stream should be written first. The codeword ZFLUSH is used to * pad the buffer to a byte boundary when the buffer will be flushed. * The remaining bits of the ZFLUSH codeword are sent in the next buffer. */ static void near addtobuffer(struct usock *up,int32 code) { if(up->zout->code != -1) { /* Insert remaining bits of ZFLUSH codeword */ up->obuf->data[up->obuf->cnt] = up->zout->code >> up->zout->flushbit; if(up->zout->flushbit + 8 >= up->zout->codebits) { /* done */ up->zout->nextbit = (up->zout->codebits - up->zout->flushbit) % 8; if(up->zout->nextbit == 0) { ++up->obuf->cnt; } up->zout->code = -1; } else { /* not done yet */ ++up->obuf->cnt; up->zout->flushbit += 8; addtobuffer(up,code); return; } } /* normal codewords are treated here */ if(up->zout->nextbit == 0) { /* we are at a byte boundary */ if(code == ZFLUSH) { up->zout->flushbit = 0; up->zout->code = ZFLUSH; return; } up->obuf->data[up->obuf->cnt++] = code; } else { up->obuf->data[up->obuf->cnt++] |= code << up->zout->nextbit; } if(code == ZFLUSH) { /* interrupt here and save the rest of the ZFLUSH * codeword for later. */ up->zout->flushbit = 8 - up->zout->nextbit; up->zout->code = ZFLUSH; return; } up->obuf->data[up->obuf->cnt] = code >> (8 - up->zout->nextbit); /* start on a third byte if necessary */ if(16 - up->zout->nextbit < up->zout->codebits) { up->obuf->data[++up->obuf->cnt] = code >> (16 - up->zout->nextbit); } up->zout->nextbit = (up->zout->nextbit + up->zout->codebits) % 8; if(up->zout->nextbit == 0) { ++up->obuf->cnt; } } void lzwflush(struct usock *up) { /* interrupt the encoding process and send the prefix codeword */ if(up->zout->prefix != -1) { addtobuffer(up,up->zout->prefix); if(up->zout->next + 1 == (int32) (1 << up->zout->codebits)) { morebits(up->zout); } up->zout->prefix = -1; } /* signal this by sending the ZFLUSH codeword */ addtobuffer(up,ZFLUSH); } int lzwdecode(struct usock *up) { int32 code, data; if(up->zin->version == -1 && (up->zin->version = PULLCHAR(&up->ibuf)) == -1) { return -1; } if(up->zin->maxbits == -1) { /* receive a recommended value for the maximum no of bits */ if((up->zin->maxbits = PULLCHAR(&up->ibuf)) == -1) { return -1; } if(up->zout->maxbits > up->zin->maxbits) { if(up->zout->codebits > up->zin->maxbits) { /* We are already using more bits than our * peer want us to, so clear the encoding * table immediately. */ addtobuffer(up,up->zout->prefix); if(up->zout->next + 1 == (int32) (1 << up->zout->codebits)) { morebits(up->zout); } addtobuffer(up,ZCC); cleartbl(up->zout); } up->zout->maxbits = up->zin->maxbits; } } for(;;) { if((data = PULLCHAR(&up->zin->buf)) != -1) { return (int)data; } if((code = nextcode(up)) == -1) { return -1; } decodetbl(code,up->zin); up->zin->cnt += len_p(up->zin->buf); pwait(NULL); /* TEST */ } } static void near getstring(int32 code,struct lzw *lzw) { for(;;) { int i, j; if(code < ZFLUSH) { lzw->buf = pushdown(lzw->buf,1); *lzw->buf->data = uchar(code); return; } i = (int)((code - ZFLUSH - 1) / LZWBLK); j = (int)((code - ZFLUSH - 1) % LZWBLK); lzw->buf = pushdown(lzw->buf,1); *lzw->buf->data = lzw->tu.tbl[i][j].data; code = (int32) lzw->tu.tbl[i][j].code; } } static char near firstchar(int32 code,struct lzw *lzw) { for(;;) { int i, j; if(code < ZFLUSH) { return uchar(code); } i = (int)((code - ZFLUSH - 1) / LZWBLK); j = (int)((code - ZFLUSH - 1) % LZWBLK); code = (int32) lzw->tu.tbl[i][j].code; } } static void near decodetbl(int32 code,struct lzw *lzw) { unsigned int i,j; int32 pagelim; if(code > lzw->next) { tprintf("LZW protocol error, process %s\n",Curproc->name); return; } if(lzw->buf == NULLBUF) { lzw->buf = alloc_mbuf(512); /* allow us to use pushdown() later */ lzw->buf->data += lzw->buf->size; } if(lzw->prefix == -1) { getstring(code,lzw); lzw->prefix = code; return; } pagelim = ((int32) 1 << lzw->codebits) / LZWBLK + 1; if(lzw->tu.tbl == NULL) { lzw->tu.tbl = cxallocw((unsigned)pagelim,sizeof(struct zentry *)); } if(code < ZFLUSH) { goto intable; } i = (unsigned int)((code - ZFLUSH - 1) / LZWBLK); j = (unsigned int)((code - ZFLUSH - 1) % LZWBLK); if(lzw->tu.tbl[i] == (struct zentry *)0) { lzw->tu.tbl[i] = cxallocw(LZWBLK,sizeof(struct zentry)); memset(lzw->tu.tbl[i], 0xff,LZWBLK * sizeof(struct zentry)); } if(lzw->tu.tbl[i][j].code == 0xffff) { lzw->tu.tbl[i][j].data = firstchar(lzw->prefix,lzw); lzw->tu.tbl[i][j].code = (int16)lzw->prefix; getstring(code,lzw); lzw->next = code + 1; lzw->prefix = code; if(lzw->next + 1 == (int32) (1 << lzw->codebits)) { morebits(lzw); } return; } intable: getstring(code,lzw); i = (unsigned int)((lzw->next - ZFLUSH - 1) / LZWBLK); j = (unsigned int)((lzw->next - ZFLUSH - 1) % LZWBLK); if(lzw->tu.tbl[i] == (struct zentry *)0) { lzw->tu.tbl[i] = cxallocw(LZWBLK,sizeof(struct zentry)); memset(lzw->tu.tbl[i], 0xff,LZWBLK * sizeof(struct zentry)); } lzw->tu.tbl[i][j].data = firstchar(code,lzw); lzw->tu.tbl[i][j].code = (int16)lzw->prefix; lzw->next++; lzw->prefix = code; if(lzw->next + 1 == (int32)(1 << lzw->codebits)) { morebits(lzw); } } /* extract the next codeword from the input stream */ static int32 near nextcode(struct usock *up) { int32 code; if(up->zin->code == -1) { /* read the first character */ if((code = PULLCHAR(&up->ibuf)) == -1) { return -1; } up->zin->code = (code >> up->zin->nextbit); } if(up->ibuf == NULLBUF) { /* next byte is not available yet */ return -1; } /* continue assembling the codeword */ up->zin->code |= ((int32) uchar(*up->ibuf->data) << (8 - up->zin->nextbit)) & (((int32) 1 << up->zin->codebits) - 1); if((16 - up->zin->nextbit) < up->zin->codebits) { PULLCHAR(&up->ibuf); up->zin->nextbit -= 8; /* pull bits from a third byte */ return nextcode(up); } code = up->zin->code; up->zin->code = -1; up->zin->nextbit = (up->zin->nextbit + up->zin->codebits) % 8; if(up->zin->nextbit == 0) { PULLCHAR(&up->ibuf); } if(code == ZCC) { cleartbl(up->zin); return nextcode(up); } if(code == ZFLUSH) { up->zin->prefix = -1; return nextcode(up); } return code; } #endif /* LZW */